{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "5f93b7d1",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/zhy/anaconda3/envs/mathglm/lib/python3.9/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
      "  from .autonotebook import tqdm as notebook_tqdm\n",
      "Building prefix dict from the default dictionary ...\n",
      "Loading model from cache /tmp/jieba.cache\n",
      "Loading model cost 0.355 seconds.\n",
      "Prefix dict has been built successfully.\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import mindspore\n",
    "from mindnlp.transformers import AutoModelForSeq2SeqLM\n",
    "from mindnlp.peft import get_peft_config, get_peft_model, get_peft_model_state_dict, LoraConfig, TaskType,IA3Config\n",
    "from mindnlp.dataset import load_dataset\n",
    "from mindnlp.core import ops\n",
    "\n",
    "from mindnlp.transformers import AutoTokenizer\n",
    "from mindnlp.common.optimization import get_linear_schedule_with_warmup\n",
    "from tqdm import tqdm\n",
    "\n",
    "model_name_or_path = \"bigscience/mt0-small\"\n",
    "tokenizer_name_or_path = \"bigscience/mt0-small\"\n",
    "\n",
    "checkpoint_name = \"financial_sentiment_analysis_lora_v1.ckpt\"\n",
    "max_length = 128\n",
    "lr = 1e-3\n",
    "num_epochs = 3\n",
    "batch_size = 8"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "8d0850ac",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "trainable params: 34,816 || all params: 300,211,584 || trainable%: 0.011597154092494979\n"
     ]
    }
   ],
   "source": [
    "# creating model\n",
    "peft_config = IA3Config(task_type=TaskType.SEQ_2_SEQ_LM, inference_mode=False)\n",
    "\n",
    "model = AutoModelForSeq2SeqLM.from_pretrained(model_name_or_path)\n",
    "\n",
    "model = get_peft_model(model, peft_config)\n",
    "model.print_trainable_parameters()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "4ee2babf",
   "metadata": {},
   "outputs": [],
   "source": [
    "mindspore.dataset.config.set_seed(123)\n",
    "# loading dataset\n",
    "dataset = load_dataset(\"financial_phrasebank\", \"sentences_allagree\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "d1ecd7a0-2e48-405e-940b-001a96ccc18f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['negative', 'neutral', 'positive']"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "classes = dataset.source.ds.features[\"label\"].names\n",
    "classes"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "8cbbf475-89b6-4368-a7eb-730dc532558e",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[WARNING] ME(2239031:136174956483520,MainProcess):2024-08-30-02:00:03.914.752 [mindspore/dataset/engine/datasets.py:1203] Dataset is shuffled before split.\n"
     ]
    }
   ],
   "source": [
    "train_dataset, validation_dataset = dataset.shuffle(64).split([0.9, 0.1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "a89748b4-3193-4419-be39-2dd7907e349e",
   "metadata": {},
   "outputs": [],
   "source": [
    "def add_text_label(sentence, label):\n",
    "    return sentence, label, classes[label.item()]\n",
    "\n",
    "train_dataset = train_dataset.map(add_text_label, ['sentence', 'label'], ['sentence', 'label', 'text_label'])\n",
    "validation_dataset = validation_dataset.map(add_text_label, ['sentence', 'label'], ['sentence', 'label', 'text_label'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "396f46c4-45ba-4d45-a98f-fff173038b5b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'sentence': Tensor(shape=[], dtype=String, value= 'The gross area of the Innova 2 project will be about 10,000 sq m ( 107,600 sq ft ) .'),\n",
       " 'label': Tensor(shape=[], dtype=Int64, value= 1),\n",
       " 'text_label': Tensor(shape=[], dtype=String, value= 'neutral')}"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "next(train_dataset.create_dict_iterator())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "603ea9ef-88dd-4c8e-bd10-df7a64940b01",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/zhy/anaconda3/envs/mathglm/lib/python3.9/site-packages/mindnlp/transformers/tokenization_utils_base.py:1526: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted, and will be then set to `False` by default. \n",
      "  warnings.warn(\n"
     ]
    }
   ],
   "source": [
    "tokenizer = AutoTokenizer.from_pretrained(model_name_or_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "86d29e1a-eb31-48bf-a6e3-bc3cfa26cde5",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "from mindnlp.dataset import BaseMapFunction\n",
    "from threading import Lock\n",
    "lock = Lock()\n",
    "\n",
    "class MapFunc(BaseMapFunction):\n",
    "    def __call__(self, sentence, label, text_label):\n",
    "        lock.acquire()\n",
    "        model_inputs = tokenizer(sentence, max_length=max_length, padding=\"max_length\", truncation=True)\n",
    "        labels = tokenizer(text_label, max_length=3, padding=\"max_length\", truncation=True)\n",
    "        lock.release()\n",
    "        labels = labels['input_ids']\n",
    "        labels = np.where(np.equal(labels, tokenizer.pad_token_id), -100, labels)\n",
    "        return model_inputs['input_ids'], model_inputs['attention_mask'], labels\n",
    "\n",
    "\n",
    "def get_dataset(dataset, tokenizer, shuffle=True):\n",
    "    input_colums=['sentence', 'label', 'text_label']\n",
    "    output_columns=['input_ids', 'attention_mask', 'labels']\n",
    "    dataset = dataset.map(MapFunc(input_colums, output_columns),\n",
    "                          input_colums, output_columns)\n",
    "    if shuffle:\n",
    "        dataset = dataset.shuffle(64)\n",
    "    dataset = dataset.batch(batch_size)\n",
    "    return dataset\n",
    "\n",
    "train_dataset = get_dataset(train_dataset, tokenizer)\n",
    "eval_dataset = get_dataset(validation_dataset, tokenizer, shuffle=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "f733a3c6",
   "metadata": {},
   "outputs": [],
   "source": [
    "from mindnlp.core import optim\n",
    "# optimizer and lr scheduler\n",
    "optimizer = optim.AdamW(model.trainable_params(), lr=lr)\n",
    "lr_scheduler = get_linear_schedule_with_warmup(\n",
    "    optimizer=optimizer,\n",
    "    num_warmup_steps=0,\n",
    "    num_training_steps=(len(train_dataset) * num_epochs),\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6b3a4090",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 255/255 [08:08<00:00,  1.92s/it]\n",
      "100%|██████████| 29/29 [00:03<00:00,  8.71it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "epoch=0: train_ppl=Tensor(shape=[], dtype=Float32, value= 61.4079) train_epoch_loss=Tensor(shape=[], dtype=Float32, value= 4.11754) eval_ppl=Tensor(shape=[], dtype=Float32, value= 9.69296) eval_epoch_loss=Tensor(shape=[], dtype=Float32, value= 2.2714)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 255/255 [20:42<00:00,  4.87s/it]\n",
      "100%|██████████| 29/29 [00:03<00:00,  8.99it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "epoch=1: train_ppl=Tensor(shape=[], dtype=Float32, value= 4.64922) train_epoch_loss=Tensor(shape=[], dtype=Float32, value= 1.5367) eval_ppl=Tensor(shape=[], dtype=Float32, value= 2.10834) eval_epoch_loss=Tensor(shape=[], dtype=Float32, value= 0.745899)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 255/255 [55:08<00:00, 12.97s/it] \n",
      "100%|██████████| 29/29 [00:03<00:00,  8.90it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "epoch=2: train_ppl=Tensor(shape=[], dtype=Float32, value= 2.02265) train_epoch_loss=Tensor(shape=[], dtype=Float32, value= 0.704408) eval_ppl=Tensor(shape=[], dtype=Float32, value= 1.66013) eval_epoch_loss=Tensor(shape=[], dtype=Float32, value= 0.506895)\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    }
   ],
   "source": [
    "from mindnlp.core import value_and_grad\n",
    "# training and evaluation\n",
    "def forward_fn(**batch):\n",
    "    outputs = model(**batch)\n",
    "    loss = outputs.loss\n",
    "    return loss\n",
    "\n",
    "grad_fn = value_and_grad(forward_fn, model.trainable_params())\n",
    "\n",
    "for epoch in range(num_epochs):\n",
    "    model.set_train()\n",
    "    total_loss = 0\n",
    "    train_total_size = train_dataset.get_dataset_size()\n",
    "    for step, batch in enumerate(tqdm(train_dataset.create_dict_iterator(), total=train_total_size)):\n",
    "        optimizer.zero_grad()\n",
    "        loss = grad_fn(**batch)\n",
    "        optimizer.step()\n",
    "        total_loss += loss.float()\n",
    "        lr_scheduler.step()\n",
    "\n",
    "    model.set_train(False)\n",
    "    eval_loss = 0\n",
    "    eval_preds = []\n",
    "    eval_total_size = eval_dataset.get_dataset_size()\n",
    "    for step, batch in enumerate(tqdm(eval_dataset.create_dict_iterator(), total=eval_total_size)):\n",
    "        with mindspore._no_grad():\n",
    "            outputs = model(**batch)\n",
    "        loss = outputs.loss\n",
    "        eval_loss += loss.float()\n",
    "        eval_preds.extend(\n",
    "            tokenizer.batch_decode(ops.argmax(outputs.logits, -1).asnumpy(), skip_special_tokens=True)\n",
    "        )\n",
    "\n",
    "    eval_epoch_loss = eval_loss / len(eval_dataset)\n",
    "    eval_ppl = ops.exp(eval_epoch_loss)\n",
    "    train_epoch_loss = total_loss / len(train_dataset)\n",
    "    train_ppl = ops.exp(train_epoch_loss)\n",
    "    print(f\"{epoch=}: {train_ppl=} {train_epoch_loss=} {eval_ppl=} {eval_epoch_loss=}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "6cafa67b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "accuracy=67.69911504424779 % on the evaluation dataset\n",
      "eval_preds[:10]=['neutral', 'neutral', 'neutral', 'neutral', 'neutral', 'neutral', '', 'positive', 'positive', 'neutral']\n",
      "ground_truth[:10]=['neutral', 'neutral', 'neutral', 'neutral', 'positive', 'neutral', 'neutral', 'positive', 'positive', 'positive']\n"
     ]
    }
   ],
   "source": [
    "# print accuracy\n",
    "correct = 0\n",
    "total = 0\n",
    "\n",
    "ground_truth = []\n",
    "\n",
    "for pred, data in zip(eval_preds, validation_dataset.create_dict_iterator(output_numpy=True)):\n",
    "    true = str(data['text_label'])\n",
    "    ground_truth.append(true)\n",
    "    if pred.strip() == true.strip():\n",
    "        correct += 1\n",
    "    total += 1\n",
    "accuracy = correct / total * 100\n",
    "print(f\"{accuracy=} % on the evaluation dataset\")\n",
    "print(f\"{eval_preds[:10]=}\")\n",
    "print(f\"{ground_truth[:10]=}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "26e88eb1-3d24-488b-ad62-0c18b81b861e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[Tensor(shape=[8, 128], dtype=Int64, value=\n",
       " [[   486,   2733,   6396 ...      0,      0,      0],\n",
       "  [   486,    259, 150106 ...      0,      0,      0],\n",
       "  [   486,   5835,    259 ...      0,      0,      0],\n",
       "  ...\n",
       "  [  1385,    339,    259 ...      0,      0,      0],\n",
       "  [   259,  18948,    776 ...      0,      0,      0],\n",
       "  [   486,    259,  20147 ...      0,      0,      0]]),\n",
       " Tensor(shape=[8, 128], dtype=Int64, value=\n",
       " [[1, 1, 1 ... 0, 0, 0],\n",
       "  [1, 1, 1 ... 0, 0, 0],\n",
       "  [1, 1, 1 ... 0, 0, 0],\n",
       "  ...\n",
       "  [1, 1, 1 ... 0, 0, 0],\n",
       "  [1, 1, 1 ... 0, 0, 0],\n",
       "  [1, 1, 1 ... 0, 0, 0]]),\n",
       " Tensor(shape=[8, 3], dtype=Int64, value=\n",
       " [[59006,     1,  -100],\n",
       "  [59006,     1,  -100],\n",
       "  [59006,     1,  -100],\n",
       "  ...\n",
       "  [59006,     1,  -100],\n",
       "  [59006,     1,  -100],\n",
       "  [18205,     1,  -100]])]"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "next(eval_dataset.create_tuple_iterator())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "a8de6005",
   "metadata": {},
   "outputs": [],
   "source": [
    "# saving model\n",
    "peft_model_id = f\"{model_name_or_path}_{peft_config.peft_type}_{peft_config.task_type}\"\n",
    "model.save_pretrained(peft_model_id)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "bd20cd4c",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n",
      "To disable this warning, you can either:\n",
      "\t- Avoid using `tokenizers` before the fork if possible\n",
      "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "9.1M\tbigscience/mt0-large_LORA_SEQ_2_SEQ_LM/adapter_model.ckpt\n"
     ]
    }
   ],
   "source": [
    "ckpt = f\"{peft_model_id}/adapter_model.ckpt\"\n",
    "!du -h $ckpt"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "76c2fc29",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.209.624 [mindspore/train/serialization.py:1378] For 'load_param_into_net', 558 parameters in the 'net' are not loaded, because they are not in the 'parameter_dict', please check whether the network structure is consistent when training and loading checkpoint.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.210.646 [mindspore/train/serialization.py:1383] base_model.shared.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.211.076 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.211.434 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.211.769 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.212.116 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.212.449 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.0.SelfAttention.relative_attention_bias.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.212.789 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.213.142 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.213.464 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.213.805 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.214.126 [mindspore/train/serialization.py:1383] base_model.encoder.block.0.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.214.458 [mindspore/train/serialization.py:1383] base_model.encoder.block.1.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.214.792 [mindspore/train/serialization.py:1383] base_model.encoder.block.1.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.215.131 [mindspore/train/serialization.py:1383] base_model.encoder.block.1.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.215.459 [mindspore/train/serialization.py:1383] base_model.encoder.block.1.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.215.770 [mindspore/train/serialization.py:1383] base_model.encoder.block.1.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.216.093 [mindspore/train/serialization.py:1383] base_model.encoder.block.1.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.217.102 [mindspore/train/serialization.py:1383] base_model.encoder.block.1.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.217.811 [mindspore/train/serialization.py:1383] base_model.encoder.block.1.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.218.153 [mindspore/train/serialization.py:1383] base_model.encoder.block.1.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.218.480 [mindspore/train/serialization.py:1383] base_model.encoder.block.2.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.218.829 [mindspore/train/serialization.py:1383] base_model.encoder.block.2.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.219.145 [mindspore/train/serialization.py:1383] base_model.encoder.block.2.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.219.475 [mindspore/train/serialization.py:1383] base_model.encoder.block.2.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.219.799 [mindspore/train/serialization.py:1383] base_model.encoder.block.2.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.220.134 [mindspore/train/serialization.py:1383] base_model.encoder.block.2.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.220.455 [mindspore/train/serialization.py:1383] base_model.encoder.block.2.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.220.778 [mindspore/train/serialization.py:1383] base_model.encoder.block.2.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.221.108 [mindspore/train/serialization.py:1383] base_model.encoder.block.2.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.221.455 [mindspore/train/serialization.py:1383] base_model.encoder.block.3.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.221.776 [mindspore/train/serialization.py:1383] base_model.encoder.block.3.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.222.099 [mindspore/train/serialization.py:1383] base_model.encoder.block.3.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.222.431 [mindspore/train/serialization.py:1383] base_model.encoder.block.3.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.222.766 [mindspore/train/serialization.py:1383] base_model.encoder.block.3.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.223.095 [mindspore/train/serialization.py:1383] base_model.encoder.block.3.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.223.413 [mindspore/train/serialization.py:1383] base_model.encoder.block.3.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.223.735 [mindspore/train/serialization.py:1383] base_model.encoder.block.3.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.224.060 [mindspore/train/serialization.py:1383] base_model.encoder.block.3.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.224.384 [mindspore/train/serialization.py:1383] base_model.encoder.block.4.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.224.709 [mindspore/train/serialization.py:1383] base_model.encoder.block.4.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.225.044 [mindspore/train/serialization.py:1383] base_model.encoder.block.4.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.225.374 [mindspore/train/serialization.py:1383] base_model.encoder.block.4.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.225.711 [mindspore/train/serialization.py:1383] base_model.encoder.block.4.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.226.042 [mindspore/train/serialization.py:1383] base_model.encoder.block.4.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.226.345 [mindspore/train/serialization.py:1383] base_model.encoder.block.4.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.226.676 [mindspore/train/serialization.py:1383] base_model.encoder.block.4.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.227.003 [mindspore/train/serialization.py:1383] base_model.encoder.block.4.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.227.304 [mindspore/train/serialization.py:1383] base_model.encoder.block.5.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.227.623 [mindspore/train/serialization.py:1383] base_model.encoder.block.5.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.227.965 [mindspore/train/serialization.py:1383] base_model.encoder.block.5.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.228.295 [mindspore/train/serialization.py:1383] base_model.encoder.block.5.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.228.616 [mindspore/train/serialization.py:1383] base_model.encoder.block.5.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.228.951 [mindspore/train/serialization.py:1383] base_model.encoder.block.5.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.229.280 [mindspore/train/serialization.py:1383] base_model.encoder.block.5.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.229.605 [mindspore/train/serialization.py:1383] base_model.encoder.block.5.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.229.927 [mindspore/train/serialization.py:1383] base_model.encoder.block.5.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.230.247 [mindspore/train/serialization.py:1383] base_model.encoder.block.6.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.230.573 [mindspore/train/serialization.py:1383] base_model.encoder.block.6.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.230.896 [mindspore/train/serialization.py:1383] base_model.encoder.block.6.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.231.234 [mindspore/train/serialization.py:1383] base_model.encoder.block.6.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.231.548 [mindspore/train/serialization.py:1383] base_model.encoder.block.6.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.231.880 [mindspore/train/serialization.py:1383] base_model.encoder.block.6.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.232.208 [mindspore/train/serialization.py:1383] base_model.encoder.block.6.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.232.537 [mindspore/train/serialization.py:1383] base_model.encoder.block.6.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.232.877 [mindspore/train/serialization.py:1383] base_model.encoder.block.6.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.233.196 [mindspore/train/serialization.py:1383] base_model.encoder.block.7.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.233.520 [mindspore/train/serialization.py:1383] base_model.encoder.block.7.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.233.859 [mindspore/train/serialization.py:1383] base_model.encoder.block.7.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.234.177 [mindspore/train/serialization.py:1383] base_model.encoder.block.7.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.234.498 [mindspore/train/serialization.py:1383] base_model.encoder.block.7.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.234.842 [mindspore/train/serialization.py:1383] base_model.encoder.block.7.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.235.153 [mindspore/train/serialization.py:1383] base_model.encoder.block.7.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.235.481 [mindspore/train/serialization.py:1383] base_model.encoder.block.7.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.235.807 [mindspore/train/serialization.py:1383] base_model.encoder.block.7.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.236.141 [mindspore/train/serialization.py:1383] base_model.encoder.block.8.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.236.463 [mindspore/train/serialization.py:1383] base_model.encoder.block.8.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.236.791 [mindspore/train/serialization.py:1383] base_model.encoder.block.8.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.237.134 [mindspore/train/serialization.py:1383] base_model.encoder.block.8.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.237.450 [mindspore/train/serialization.py:1383] base_model.encoder.block.8.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.237.776 [mindspore/train/serialization.py:1383] base_model.encoder.block.8.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.238.099 [mindspore/train/serialization.py:1383] base_model.encoder.block.8.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.238.434 [mindspore/train/serialization.py:1383] base_model.encoder.block.8.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.238.748 [mindspore/train/serialization.py:1383] base_model.encoder.block.8.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.239.085 [mindspore/train/serialization.py:1383] base_model.encoder.block.9.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.239.403 [mindspore/train/serialization.py:1383] base_model.encoder.block.9.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.239.710 [mindspore/train/serialization.py:1383] base_model.encoder.block.9.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.240.053 [mindspore/train/serialization.py:1383] base_model.encoder.block.9.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.240.363 [mindspore/train/serialization.py:1383] base_model.encoder.block.9.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.240.691 [mindspore/train/serialization.py:1383] base_model.encoder.block.9.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.241.019 [mindspore/train/serialization.py:1383] base_model.encoder.block.9.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.241.353 [mindspore/train/serialization.py:1383] base_model.encoder.block.9.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.241.695 [mindspore/train/serialization.py:1383] base_model.encoder.block.9.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.242.018 [mindspore/train/serialization.py:1383] base_model.encoder.block.10.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.242.352 [mindspore/train/serialization.py:1383] base_model.encoder.block.10.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.242.662 [mindspore/train/serialization.py:1383] base_model.encoder.block.10.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.242.999 [mindspore/train/serialization.py:1383] base_model.encoder.block.10.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.243.318 [mindspore/train/serialization.py:1383] base_model.encoder.block.10.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.243.645 [mindspore/train/serialization.py:1383] base_model.encoder.block.10.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.243.975 [mindspore/train/serialization.py:1383] base_model.encoder.block.10.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.244.309 [mindspore/train/serialization.py:1383] base_model.encoder.block.10.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.244.624 [mindspore/train/serialization.py:1383] base_model.encoder.block.10.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.244.950 [mindspore/train/serialization.py:1383] base_model.encoder.block.11.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.245.283 [mindspore/train/serialization.py:1383] base_model.encoder.block.11.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.245.618 [mindspore/train/serialization.py:1383] base_model.encoder.block.11.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.245.946 [mindspore/train/serialization.py:1383] base_model.encoder.block.11.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.246.288 [mindspore/train/serialization.py:1383] base_model.encoder.block.11.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.246.611 [mindspore/train/serialization.py:1383] base_model.encoder.block.11.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.246.948 [mindspore/train/serialization.py:1383] base_model.encoder.block.11.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.247.259 [mindspore/train/serialization.py:1383] base_model.encoder.block.11.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.247.595 [mindspore/train/serialization.py:1383] base_model.encoder.block.11.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.247.914 [mindspore/train/serialization.py:1383] base_model.encoder.block.12.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.248.234 [mindspore/train/serialization.py:1383] base_model.encoder.block.12.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.248.554 [mindspore/train/serialization.py:1383] base_model.encoder.block.12.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.248.885 [mindspore/train/serialization.py:1383] base_model.encoder.block.12.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.249.232 [mindspore/train/serialization.py:1383] base_model.encoder.block.12.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.249.545 [mindspore/train/serialization.py:1383] base_model.encoder.block.12.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.249.890 [mindspore/train/serialization.py:1383] base_model.encoder.block.12.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.250.215 [mindspore/train/serialization.py:1383] base_model.encoder.block.12.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.250.542 [mindspore/train/serialization.py:1383] base_model.encoder.block.12.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.250.862 [mindspore/train/serialization.py:1383] base_model.encoder.block.13.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.251.191 [mindspore/train/serialization.py:1383] base_model.encoder.block.13.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.251.515 [mindspore/train/serialization.py:1383] base_model.encoder.block.13.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.251.855 [mindspore/train/serialization.py:1383] base_model.encoder.block.13.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.252.180 [mindspore/train/serialization.py:1383] base_model.encoder.block.13.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.252.496 [mindspore/train/serialization.py:1383] base_model.encoder.block.13.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.252.835 [mindspore/train/serialization.py:1383] base_model.encoder.block.13.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.253.148 [mindspore/train/serialization.py:1383] base_model.encoder.block.13.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.253.498 [mindspore/train/serialization.py:1383] base_model.encoder.block.13.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.253.815 [mindspore/train/serialization.py:1383] base_model.encoder.block.14.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.254.529 [mindspore/train/serialization.py:1383] base_model.encoder.block.14.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.254.882 [mindspore/train/serialization.py:1383] base_model.encoder.block.14.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.255.229 [mindspore/train/serialization.py:1383] base_model.encoder.block.14.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.255.558 [mindspore/train/serialization.py:1383] base_model.encoder.block.14.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.255.885 [mindspore/train/serialization.py:1383] base_model.encoder.block.14.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.256.197 [mindspore/train/serialization.py:1383] base_model.encoder.block.14.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.256.525 [mindspore/train/serialization.py:1383] base_model.encoder.block.14.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.256.868 [mindspore/train/serialization.py:1383] base_model.encoder.block.14.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.257.190 [mindspore/train/serialization.py:1383] base_model.encoder.block.15.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.257.532 [mindspore/train/serialization.py:1383] base_model.encoder.block.15.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.257.851 [mindspore/train/serialization.py:1383] base_model.encoder.block.15.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.258.188 [mindspore/train/serialization.py:1383] base_model.encoder.block.15.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.258.514 [mindspore/train/serialization.py:1383] base_model.encoder.block.15.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.258.827 [mindspore/train/serialization.py:1383] base_model.encoder.block.15.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.259.168 [mindspore/train/serialization.py:1383] base_model.encoder.block.15.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.259.481 [mindspore/train/serialization.py:1383] base_model.encoder.block.15.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.259.815 [mindspore/train/serialization.py:1383] base_model.encoder.block.15.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.260.139 [mindspore/train/serialization.py:1383] base_model.encoder.block.16.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.260.466 [mindspore/train/serialization.py:1383] base_model.encoder.block.16.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.260.797 [mindspore/train/serialization.py:1383] base_model.encoder.block.16.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.261.121 [mindspore/train/serialization.py:1383] base_model.encoder.block.16.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.261.459 [mindspore/train/serialization.py:1383] base_model.encoder.block.16.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.261.784 [mindspore/train/serialization.py:1383] base_model.encoder.block.16.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.262.122 [mindspore/train/serialization.py:1383] base_model.encoder.block.16.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.262.447 [mindspore/train/serialization.py:1383] base_model.encoder.block.16.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.262.768 [mindspore/train/serialization.py:1383] base_model.encoder.block.16.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.263.080 [mindspore/train/serialization.py:1383] base_model.encoder.block.17.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.263.409 [mindspore/train/serialization.py:1383] base_model.encoder.block.17.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.263.730 [mindspore/train/serialization.py:1383] base_model.encoder.block.17.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.264.070 [mindspore/train/serialization.py:1383] base_model.encoder.block.17.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.264.375 [mindspore/train/serialization.py:1383] base_model.encoder.block.17.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.264.715 [mindspore/train/serialization.py:1383] base_model.encoder.block.17.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.265.036 [mindspore/train/serialization.py:1383] base_model.encoder.block.17.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.265.353 [mindspore/train/serialization.py:1383] base_model.encoder.block.17.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.265.692 [mindspore/train/serialization.py:1383] base_model.encoder.block.17.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.266.001 [mindspore/train/serialization.py:1383] base_model.encoder.block.18.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.266.330 [mindspore/train/serialization.py:1383] base_model.encoder.block.18.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.266.659 [mindspore/train/serialization.py:1383] base_model.encoder.block.18.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.266.971 [mindspore/train/serialization.py:1383] base_model.encoder.block.18.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.267.305 [mindspore/train/serialization.py:1383] base_model.encoder.block.18.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.267.625 [mindspore/train/serialization.py:1383] base_model.encoder.block.18.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.267.957 [mindspore/train/serialization.py:1383] base_model.encoder.block.18.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.268.279 [mindspore/train/serialization.py:1383] base_model.encoder.block.18.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.268.614 [mindspore/train/serialization.py:1383] base_model.encoder.block.18.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.268.935 [mindspore/train/serialization.py:1383] base_model.encoder.block.19.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.269.280 [mindspore/train/serialization.py:1383] base_model.encoder.block.19.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.269.614 [mindspore/train/serialization.py:1383] base_model.encoder.block.19.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.269.932 [mindspore/train/serialization.py:1383] base_model.encoder.block.19.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.270.261 [mindspore/train/serialization.py:1383] base_model.encoder.block.19.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.270.582 [mindspore/train/serialization.py:1383] base_model.encoder.block.19.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.270.924 [mindspore/train/serialization.py:1383] base_model.encoder.block.19.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.271.251 [mindspore/train/serialization.py:1383] base_model.encoder.block.19.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.271.566 [mindspore/train/serialization.py:1383] base_model.encoder.block.19.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.271.907 [mindspore/train/serialization.py:1383] base_model.encoder.block.20.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.272.231 [mindspore/train/serialization.py:1383] base_model.encoder.block.20.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.272.543 [mindspore/train/serialization.py:1383] base_model.encoder.block.20.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.272.882 [mindspore/train/serialization.py:1383] base_model.encoder.block.20.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.273.200 [mindspore/train/serialization.py:1383] base_model.encoder.block.20.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.273.537 [mindspore/train/serialization.py:1383] base_model.encoder.block.20.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.273.849 [mindspore/train/serialization.py:1383] base_model.encoder.block.20.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.274.185 [mindspore/train/serialization.py:1383] base_model.encoder.block.20.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.274.510 [mindspore/train/serialization.py:1383] base_model.encoder.block.20.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.274.822 [mindspore/train/serialization.py:1383] base_model.encoder.block.21.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.275.151 [mindspore/train/serialization.py:1383] base_model.encoder.block.21.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.275.491 [mindspore/train/serialization.py:1383] base_model.encoder.block.21.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.275.795 [mindspore/train/serialization.py:1383] base_model.encoder.block.21.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.276.135 [mindspore/train/serialization.py:1383] base_model.encoder.block.21.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.276.452 [mindspore/train/serialization.py:1383] base_model.encoder.block.21.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.276.793 [mindspore/train/serialization.py:1383] base_model.encoder.block.21.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.277.121 [mindspore/train/serialization.py:1383] base_model.encoder.block.21.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.277.431 [mindspore/train/serialization.py:1383] base_model.encoder.block.21.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.277.761 [mindspore/train/serialization.py:1383] base_model.encoder.block.22.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.278.089 [mindspore/train/serialization.py:1383] base_model.encoder.block.22.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.278.429 [mindspore/train/serialization.py:1383] base_model.encoder.block.22.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.278.750 [mindspore/train/serialization.py:1383] base_model.encoder.block.22.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.279.079 [mindspore/train/serialization.py:1383] base_model.encoder.block.22.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.279.395 [mindspore/train/serialization.py:1383] base_model.encoder.block.22.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.279.723 [mindspore/train/serialization.py:1383] base_model.encoder.block.22.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.280.064 [mindspore/train/serialization.py:1383] base_model.encoder.block.22.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.280.376 [mindspore/train/serialization.py:1383] base_model.encoder.block.22.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.280.705 [mindspore/train/serialization.py:1383] base_model.encoder.block.23.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.281.050 [mindspore/train/serialization.py:1383] base_model.encoder.block.23.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.281.387 [mindspore/train/serialization.py:1383] base_model.encoder.block.23.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.281.712 [mindspore/train/serialization.py:1383] base_model.encoder.block.23.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.282.039 [mindspore/train/serialization.py:1383] base_model.encoder.block.23.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.282.352 [mindspore/train/serialization.py:1383] base_model.encoder.block.23.layer.1.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.282.687 [mindspore/train/serialization.py:1383] base_model.encoder.block.23.layer.1.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.283.002 [mindspore/train/serialization.py:1383] base_model.encoder.block.23.layer.1.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.283.341 [mindspore/train/serialization.py:1383] base_model.encoder.block.23.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.283.666 [mindspore/train/serialization.py:1383] base_model.encoder.final_layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.283.990 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.284.303 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.284.623 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.284.947 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.285.278 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.0.SelfAttention.relative_attention_bias.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.285.604 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.285.930 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.286.260 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.286.587 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.286.900 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.287.225 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.287.555 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.287.897 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.288.284 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.288.622 [mindspore/train/serialization.py:1383] base_model.decoder.block.0.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.288.933 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.289.289 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.289.603 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.289.934 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.290.267 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.290.592 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.290.917 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.291.243 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.291.555 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.291.892 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.292.210 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.292.535 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.292.882 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.308.830 [mindspore/train/serialization.py:1383] base_model.decoder.block.1.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.309.321 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.309.653 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.309.982 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.310.311 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.310.636 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.310.951 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.311.283 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.311.605 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.311.949 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.312.267 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.312.598 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.312.914 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.313.263 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.313.587 [mindspore/train/serialization.py:1383] base_model.decoder.block.2.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.313.915 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.314.239 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.314.548 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.314.887 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.315.212 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.315.526 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.315.868 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.316.184 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.316.502 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.316.843 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.317.156 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.317.498 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.317.807 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.318.150 [mindspore/train/serialization.py:1383] base_model.decoder.block.3.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.318.456 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.318.801 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.319.112 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.319.450 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.319.767 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.320.093 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.320.422 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.320.762 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.321.094 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.321.426 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.321.749 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.322.054 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.322.380 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.322.711 [mindspore/train/serialization.py:1383] base_model.decoder.block.4.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.323.031 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.323.372 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.323.684 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.324.006 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.324.359 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.324.689 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.325.002 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.325.347 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.325.662 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.326.003 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.329.648 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.329.987 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.330.315 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.330.640 [mindspore/train/serialization.py:1383] base_model.decoder.block.5.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.330.976 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.331.313 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.331.629 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.331.962 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.332.289 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.332.615 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.332.933 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.333.284 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.333.614 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.333.939 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.334.267 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.334.592 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.334.934 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.335.261 [mindspore/train/serialization.py:1383] base_model.decoder.block.6.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.336.779 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.337.232 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.337.548 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.337.876 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.338.206 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.338.528 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.338.858 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.339.189 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.339.502 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.339.837 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.340.150 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.340.474 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.340.797 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.341.183 [mindspore/train/serialization.py:1383] base_model.decoder.block.7.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.341.538 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.341.851 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.342.193 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.342.506 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.342.834 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.343.155 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.343.498 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.343.807 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.344.146 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.344.475 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.344.784 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.345.104 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.345.441 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.345.767 [mindspore/train/serialization.py:1383] base_model.decoder.block.8.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.346.104 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.346.428 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.346.749 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.347.075 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.347.398 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.347.723 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.348.043 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.348.371 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.348.676 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.349.013 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.349.464 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.349.830 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.350.141 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.350.463 [mindspore/train/serialization.py:1383] base_model.decoder.block.9.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.350.798 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.351.115 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.351.444 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.351.770 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.352.099 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.352.439 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.352.749 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.353.068 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.353.403 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.353.731 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.354.056 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.354.397 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.354.711 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.355.040 [mindspore/train/serialization.py:1383] base_model.decoder.block.10.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.355.378 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.355.707 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.356.029 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.356.357 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.356.683 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.357.023 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.357.356 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.357.682 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.357.992 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.358.331 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.358.642 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.358.969 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.359.296 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.359.613 [mindspore/train/serialization.py:1383] base_model.decoder.block.11.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.359.933 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.360.273 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.360.585 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.360.928 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.361.256 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.361.584 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.361.900 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.362.226 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.362.564 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.362.890 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.363.207 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.363.527 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.363.848 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.364.183 [mindspore/train/serialization.py:1383] base_model.decoder.block.12.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.364.496 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.364.832 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.365.155 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.365.483 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.365.807 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.366.150 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.372.128 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.372.465 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.372.795 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.373.135 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.373.451 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.373.773 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.374.097 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.374.417 [mindspore/train/serialization.py:1383] base_model.decoder.block.13.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.374.758 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.375.072 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.375.407 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.375.726 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.376.038 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.376.356 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.376.700 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.377.011 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.377.359 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.377.677 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.378.011 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.378.322 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.378.644 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.378.972 [mindspore/train/serialization.py:1383] base_model.decoder.block.14.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.379.339 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.379.667 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.379.999 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.380.329 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.380.673 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.380.998 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.381.318 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.381.661 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.381.980 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.382.303 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.382.643 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.382.955 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.383.279 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.383.620 [mindspore/train/serialization.py:1383] base_model.decoder.block.15.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.383.930 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.384.268 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.384.574 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.384.901 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.385.233 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.385.576 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.385.889 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.386.224 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.386.549 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.386.866 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.387.212 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.387.522 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.387.841 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.388.170 [mindspore/train/serialization.py:1383] base_model.decoder.block.16.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.388.496 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.388.821 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.389.177 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.389.508 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.389.834 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.390.159 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.390.471 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.390.813 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.391.139 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.391.450 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.391.771 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.392.099 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.392.425 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.392.761 [mindspore/train/serialization.py:1383] base_model.decoder.block.17.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.393.069 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.393.424 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.393.751 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.394.072 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.394.378 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.394.699 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.395.045 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.395.347 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.395.671 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.396.005 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.396.313 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.396.634 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.396.967 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.397.305 [mindspore/train/serialization.py:1383] base_model.decoder.block.18.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.397.620 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.397.959 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.398.283 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.398.611 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.398.931 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.399.252 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.399.592 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.399.901 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.400.224 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.406.048 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.406.498 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.406.938 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.407.249 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.407.573 [mindspore/train/serialization.py:1383] base_model.decoder.block.19.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.407.916 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.408.227 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.408.550 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.408.890 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.409.225 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.409.542 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.409.858 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.410.205 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.410.481 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.410.817 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.411.139 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.411.473 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.411.819 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.412.139 [mindspore/train/serialization.py:1383] base_model.decoder.block.20.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.412.465 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.412.767 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.413.054 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.413.359 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.413.699 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.413.977 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.414.320 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.414.640 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.414.986 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.415.311 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.415.603 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.415.932 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.416.281 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.416.594 [mindspore/train/serialization.py:1383] base_model.decoder.block.21.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.416.927 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.417.248 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.417.570 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.417.905 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.418.243 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.418.579 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.418.913 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.419.248 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.419.598 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.422.711 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.423.032 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.423.344 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.423.634 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.423.942 [mindspore/train/serialization.py:1383] base_model.decoder.block.22.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.424.271 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.0.SelfAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.424.569 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.0.SelfAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.424.909 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.0.SelfAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.425.219 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.0.SelfAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.425.545 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.0.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.425.890 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.1.EncDecAttention.q.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.426.229 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.1.EncDecAttention.k.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.426.553 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.1.EncDecAttention.v.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.426.847 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.1.EncDecAttention.o.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.427.197 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.1.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.427.519 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.2.DenseReluDense.wi_0.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.427.818 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.2.DenseReluDense.wi_1.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.428.149 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.2.DenseReluDense.wo.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.428.471 [mindspore/train/serialization.py:1383] base_model.decoder.block.23.layer.2.layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.428.818 [mindspore/train/serialization.py:1383] base_model.decoder.final_layer_norm.weight is not loaded.\n",
      "[WARNING] ME(19505:139997890737984,MainProcess):2024-05-23-10:19:04.429.176 [mindspore/train/serialization.py:1383] base_model.lm_head.weight is not loaded.\n"
     ]
    }
   ],
   "source": [
    "from mindnlp.peft import PeftModel, PeftConfig\n",
    "\n",
    "peft_model_id = f\"{model_name_or_path}_{peft_config.peft_type}_{peft_config.task_type}\"\n",
    "\n",
    "config = PeftConfig.from_pretrained(peft_model_id)\n",
    "model = AutoModelForSeq2SeqLM.from_pretrained(config.base_model_name_or_path)\n",
    "model = PeftModel.from_pretrained(model, peft_model_id)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "37d712ce",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Sanity-check the reloaded model on one raw validation example.\n",
    "model.set_train(False)\n",
    "example = next(validation_dataset.create_dict_iterator(output_numpy=True))\n",
    "\n",
    "# Feed the model the input sentence, NOT the label: tokenizing\n",
    "# example['text_label'] hands the answer to the model, so the generated\n",
    "# text trivially echoes it and says nothing about model quality.\n",
    "# NOTE(review): assumes the raw split keeps the dataset's 'sentence'\n",
    "# column next to 'text_label' - confirm against the dataset-loading cell.\n",
    "print(example['sentence'])\n",
    "print(example['text_label'])  # expected answer, for comparison only\n",
    "inputs = tokenizer(example['sentence'], return_tensors=\"ms\")\n",
    "print(inputs)\n",
    "\n",
    "# Gradients are not needed for generation.\n",
    "with mindspore._no_grad():\n",
    "    outputs = model.generate(input_ids=inputs[\"input_ids\"], max_new_tokens=10)\n",
    "    print(outputs)\n",
    "    # Decode the generated ids back to text; compare with the label printed above.\n",
    "    print(tokenizer.batch_decode(outputs.asnumpy(), skip_special_tokens=True))"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "mathglm",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
